\relax 
\citation{SMT:Koehn2010}
\citation{Mcnamee:2006}
\citation{Mcnamee:2006}
\citation{Gerdemann:2010}
\select@language{UKenglish}
\@writefile{toc}{\select@language{UKenglish}}
\@writefile{lof}{\select@language{UKenglish}}
\@writefile{lot}{\select@language{UKenglish}}
\citation{Mcnamee:2006}
\citation{Gerdemann:2010}
\@writefile{toc}{\contentsline {section}{\tocsection {}{}{Introduction}}{5}}
\@writefile{toc}{\contentsline {part}{\tocpart {Part}{1}{Repeats}}{6}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{1}{Continuous Repeats}}{6}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{1.1}{Sequences}}{6}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{1.2}{Continuous Repeats}}{8}}
\newlabel{def:left-max}{{1.11}{9}}
\citation{DBLP:journals/siamcomp/ManberM93}
\citation{DBLP:journals/jda/AbouelhodaKO04}
\citation{DBLP:journals/algorithmica/KimKP08}
\@writefile{toc}{\contentsline {section}{\tocsection {}{2}{Discovering Continuous Repeats}}{11}}
\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces The suffixes of the sequence $S$ sorted by index.\relax }}{11}}
\providecommand*\caption@xref[2]{\@setref\relax\@undefined{#1}}
\newlabel{fig:suffixes}{{1}{11}}
\citation{DBLP:books/daglib/0020103}
\citation{Karkkainen:2006}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.1}{Suffix Table}}{12}}
\@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces The $suftab$ array for the sequence $S$.\relax }}{12}}
\newlabel{fig:suftab}{{2}{12}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.2}{Longest Common Prefix Table}}{13}}
\@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces The $lcptab$ array for the sequence $S$.\relax }}{13}}
\newlabel{fig:lcptab}{{3}{13}}
\citation{DBLP:conf/cpm/KasaiLAAP01}
\citation{DBLP:journals/siamcomp/ManberM93}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.3}{\emph  {lcp-interval}}}{14}}
\newlabel{def:lcpi}{{2.3}{14}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.4}{Suffix Array}}{15}}
\@writefile{lof}{\contentsline {figure}{\numberline {4}{\ignorespaces The suffix array for the sequence $S$.\relax }}{15}}
\newlabel{fig:sa}{{4}{15}}
\@writefile{lot}{\contentsline {table}{\numberline {1}{\ignorespaces Suffix array properties.\relax }}{15}}
\newlabel{tab:sa}{{1}{15}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.5}{\emph  {lcp-interval} Tree}}{15}}
\@writefile{lof}{\contentsline {figure}{\numberline {5}{\ignorespaces The lcp-interval tree with the $suftab$ and the $lcptab$ for the sequence $S$.\relax }}{16}}
\newlabel{fig:itree}{{5}{16}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.6}{Using an \emph  {lcp-interval} Tree to Discover Repeats}}{16}}
\citation{DBLP:conf/focs/Weiner73}
\citation{McCreight:1976:SST:321941.321946}
\citation{ukkonen1995:suffix}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.7}{Suffix Tree}}{17}}
\citation{DBLP:journals/jda/AbouelhodaKO04}
\citation{DBLP:journals/jda/AbouelhodaKO04}
\@writefile{lof}{\contentsline {figure}{\numberline {6}{\ignorespaces The suffix tree for the sequence $S$.\relax }}{18}}
\newlabel{fig:stree}{{6}{18}}
\@writefile{lot}{\contentsline {table}{\numberline {2}{\ignorespaces Suffix tree properties.\relax }}{18}}
\newlabel{tab:st}{{2}{18}}
\@writefile{lot}{\contentsline {table}{\numberline {3}{\ignorespaces Enhanced suffix array properties.\relax }}{19}}
\newlabel{tab:esa}{{3}{19}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.8}{Enhanced Suffix Array}}{19}}
\@writefile{lof}{\contentsline {figure}{\numberline {7}{\ignorespaces The enhanced suffix array for the sequence $S$.\relax }}{19}}
\newlabel{fig:esa}{{7}{19}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.9}{Child Table}}{19}}
\citation{Burrows94ablock-sorting}
\@writefile{lof}{\contentsline {figure}{\numberline {8}{\ignorespaces lcp-interval tree traversal using the $cldtab$: level 0.\relax }}{20}}
\newlabel{fig:cldtab0}{{8}{20}}
\@writefile{lof}{\contentsline {figure}{\numberline {9}{\ignorespaces lcp-interval tree traversal using the $cldtab$: level 1.\relax }}{21}}
\newlabel{fig:cldtab1}{{9}{21}}
\@writefile{lof}{\contentsline {figure}{\numberline {10}{\ignorespaces lcp-interval tree traversal using the $cldtab$: level 2.\relax }}{21}}
\newlabel{fig:cldtab2}{{10}{21}}
\@writefile{lof}{\contentsline {figure}{\numberline {11}{\ignorespaces lcp-interval tree traversal using the $cldtab$: level 3.\relax }}{21}}
\newlabel{fig:cldtab3}{{11}{21}}
\@writefile{lof}{\contentsline {figure}{\numberline {12}{\ignorespaces lcp-interval tree traversal using the $cldtab$: complete tree.\relax }}{21}}
\newlabel{fig:cldtab4}{{12}{21}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.10}{Burrows--Wheeler Transform Table}}{21}}
\citation{DBLP:journals/algorithmica/KimKP08}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.11}{Linearised Suffix Tree}}{22}}
\@writefile{lot}{\contentsline {table}{\numberline {4}{\ignorespaces Linearised suffix tree properties.\relax }}{22}}
\newlabel{tab:lst}{{4}{22}}
\@writefile{lof}{\contentsline {figure}{\numberline {13}{\ignorespaces Using Burrows-Wheeler transform table to find maximal repeats.\relax }}{23}}
\newlabel{fig:bwttab}{{13}{23}}
\@writefile{lof}{\contentsline {figure}{\numberline {14}{\ignorespaces The linearized suffix tree for the sequence $S$\relax }}{24}}
\newlabel{fig:lst}{{14}{24}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{2.12}{New Child Table}}{24}}
\@writefile{lof}{\contentsline {figure}{\numberline {15}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 0.\relax }}{25}}
\newlabel{fig:newcldtab0}{{15}{25}}
\@writefile{lof}{\contentsline {figure}{\numberline {16}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 1.\relax }}{25}}
\newlabel{fig:newcldtab1}{{16}{25}}
\@writefile{lof}{\contentsline {figure}{\numberline {17}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 2.\relax }}{25}}
\newlabel{fig:newcldtab2}{{17}{25}}
\@writefile{lof}{\contentsline {figure}{\numberline {18}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 3.\relax }}{26}}
\newlabel{fig:newcldtab3}{{18}{26}}
\@writefile{lof}{\contentsline {figure}{\numberline {19}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 4.\relax }}{26}}
\newlabel{fig:newcldtab4}{{19}{26}}
\@writefile{lof}{\contentsline {figure}{\numberline {20}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 5.\relax }}{26}}
\newlabel{fig:newcldtab5}{{20}{26}}
\@writefile{lof}{\contentsline {figure}{\numberline {21}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 6.\relax }}{27}}
\newlabel{fig:newcldtab6}{{21}{27}}
\@writefile{lof}{\contentsline {figure}{\numberline {22}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: level 7.\relax }}{27}}
\newlabel{fig:newcldtab7}{{22}{27}}
\@writefile{lof}{\contentsline {figure}{\numberline {23}{\ignorespaces Binary lcp-interval tree traversal using the \textit  {newcldtab}: complete tree.\relax }}{28}}
\newlabel{fig:newcldtab8}{{23}{28}}
\@writefile{lof}{\contentsline {figure}{\numberline {24}{\ignorespaces The binary lcp-interval tree with the $suftab$ and the $lcptab$ for the sequence $S$.\relax }}{29}}
\newlabel{fig:bitree}{{24}{29}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{3}{Discontinuous Repeats}}{30}}
\newlabel{def:dseqeq}{{3.5}{31}}
\citation{Gerdemann:2010}
\@writefile{toc}{\contentsline {section}{\tocsection {}{4}{Discovering Discontinuous Repeats}}{32}}
\@writefile{lof}{\contentsline {figure}{\numberline {25}{\ignorespaces The section of the \textit  {suftab} corresponding to the interval $[6..9]$, the embedded suffixes are highlighted.\relax }}{33}}
\newlabel{fig:esuffixes}{{25}{33}}
\@writefile{lof}{\contentsline {figure}{\numberline {26}{\ignorespaces A window of size 5 applied to the embedded suffixes in Figure \ref  {fig:esuffixes}.\relax }}{33}}
\newlabel{fig:window}{{26}{33}}
\@writefile{lof}{\contentsline {figure}{\numberline {27}{\ignorespaces The suffix table and the inverse suffix table for $S$.\relax }}{34}}
\newlabel{fig:isuftab}{{27}{34}}
\@writefile{lof}{\contentsline {figure}{\numberline {28}{\ignorespaces The embedded suffixes in Figure \ref  {fig:esuffixes} extended by all the suffixes from the window in Figure \ref  {fig:window}.\relax }}{34}}
\newlabel{fig:ewinsuffixes}{{28}{34}}
\citation{DBLP:conf/cpm/KasaiLAAP01}
\@writefile{lof}{\contentsline {figure}{\numberline {29}{\ignorespaces The embedded \textit  {suftab} array for the interval $[6..9]$.\relax }}{35}}
\newlabel{fig:esuftab}{{29}{35}}
\@writefile{lof}{\contentsline {figure}{\numberline {30}{\ignorespaces The embedded \textit  {lcptab} array for the interval $[6..9]$.\relax }}{35}}
\newlabel{fig:elcptab}{{30}{35}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{4.1}{Embedded Suffix Tree}}{36}}
\@writefile{lof}{\contentsline {figure}{\numberline {31}{\ignorespaces The embedded suffix tree for the interval $[6..9]$\relax }}{36}}
\newlabel{fig:est}{{31}{36}}
\@writefile{lot}{\contentsline {table}{\numberline {5}{\ignorespaces Embedded suffix tree properties.\relax }}{36}}
\newlabel{tab:est}{{5}{36}}
\@writefile{lof}{\contentsline {figure}{\numberline {32}{\ignorespaces The embedded binary lcp-interval tree for the interval $[6..9]$.\relax }}{37}}
\newlabel{fig:etree}{{32}{37}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{4.2}{Recursively Embedded Suffix Tree}}{37}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {1}{\ignorespaces $\mathbf  {extract}(\mathbf  {D}, tree)$ - recursive embedding of suffix trees\relax }}{38}}
\newlabel{pro:rest}{{1}{38}}
\@writefile{toc}{\contentsline {part}{\tocpart {Part}{2}{Alignment}}{39}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{5}{Preliminaries}}{39}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{5.1}{Preprocessing}}{39}}
\@writefile{lof}{\contentsline {figure}{\numberline {33}{\ignorespaces A corpus after preprocessing.\relax }}{39}}
\newlabel{fig:corpus}{{33}{39}}
\@writefile{lof}{\contentsline {figure}{\numberline {34}{\ignorespaces A corpus split into documents.\relax }}{40}}
\newlabel{fig:docs}{{34}{40}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{5.2}{Parallel Corpora}}{40}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{5.3}{Alignment}}{40}}
\@writefile{lof}{\contentsline {figure}{\numberline {35}{\ignorespaces A parallel corpus after preprocessing.\relax }}{41}}
\newlabel{fig:pcorpus}{{35}{41}}
\@writefile{lof}{\contentsline {figure}{\numberline {36}{\ignorespaces A parallel corpus split into documents.\relax }}{41}}
\newlabel{fig:pdocs}{{36}{41}}
\citation{Hogben:2006}
\citation{widdows04geometry}
\@writefile{toc}{\contentsline {section}{\tocsection {}{6}{Vector Space Model}}{42}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.1}{Vectors}}{42}}
\citation{Hogben:2006}
\citation{Salton:1971:SRS:1102022}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.2}{\emph  {term-document} Matrix}}{43}}
\citation{deerwester90indexing}
\citation{DBLP:journals/corr/abs-1003-1141}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.3}{\emph  {word\IeC {\textendash }context} Matrix}}{44}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.4}{Vector Space Models}}{44}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.5}{\emph  {term frequency} $\times $ \emph  {inverse document} Frequency}}{44}}
\@writefile{lof}{\contentsline {figure}{\numberline {37}{\ignorespaces A term-document matrix.\relax }}{45}}
\newlabel{fig:tdmatrix}{{37}{45}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.6}{Positive Pointwise Mutual Information}}{46}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{6.7}{Similarity}}{46}}
\citation{Yamamoto:2001:USA:972778.972779}
\@writefile{toc}{\contentsline {section}{\tocsection {}{7}{Alignment of Discontinuous Repeats}}{47}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{7.1}{\emph  {index-document} Mapping}}{47}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {2}{\ignorespaces $\mathbf  {tovector}([i..j], idmap)$ - converting an interval to a repeat vector\relax }}{47}}
\newlabel{pro:tovector}{{2}{47}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{7.2}{\emph  {repeat-context} Matrix}}{48}}
\@writefile{lof}{\contentsline {figure}{\numberline {38}{\ignorespaces Repeat vectors in document space.\relax }}{48}}
\newlabel{fig:rspace}{{38}{48}}
\@writefile{lof}{\contentsline {figure}{\numberline {39}{\ignorespaces Source and target repeat vector comparison.\relax }}{50}}
\newlabel{fig:vectors}{{39}{50}}
\citation{koehn2005epc}
\@writefile{toc}{\contentsline {part}{\tocpart {Part}{3}{Implementation and Testing}}{51}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{8}{Implementation}}{51}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{9}{Testing}}{51}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{9.1}{$2$-$2$ Alignment of Discontinuous Repeats}}{51}}
\@writefile{lot}{\contentsline {table}{\numberline {6}{\ignorespaces A sample of $2$-to-$2$ alignments.\relax }}{51}}
\newlabel{tab:results2-2}{{6}{51}}
\@writefile{lot}{\contentsline {table}{\numberline {7}{\ignorespaces A sample of $2$-to-$2$ alignments with similarity scores.\relax }}{52}}
\newlabel{tab:results}{{7}{52}}
\@writefile{toc}{\contentsline {subsection}{\tocsubsection {}{9.2}{$n$-to-$m$ Alignment of Discontinuous Repeats}}{53}}
\@writefile{lot}{\contentsline {table}{\numberline {8}{\ignorespaces A sample of $3$-to-$3$ alignments.\relax }}{53}}
\newlabel{tab:results3-3}{{8}{53}}
\@writefile{lot}{\contentsline {table}{\numberline {9}{\ignorespaces A sample of $2$-to-$3$ alignments.\relax }}{54}}
\newlabel{tab:results2-3}{{9}{54}}
\@writefile{lot}{\contentsline {table}{\numberline {10}{\ignorespaces A sample of $3$-to-$4$ alignments.\relax }}{54}}
\newlabel{tab:results3-4}{{10}{54}}
\citation{DBLP:books/daglib/0001349}
\@writefile{toc}{\contentsline {section}{\tocsection {}{10}{Conclusion and Future Research Directions}}{55}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{}{Acknowledgments}}{56}}
\citation{*}
\bibdata{sa}
\bibcite{DBLP:journals/jda/AbouelhodaKO04}{Abouelhoda et~al., 2004}
\bibcite{Apostolico2009227}{Apostolico and Satta, 2009}
\bibcite{Burrows94ablock-sorting}{Burrows et~al., 1994}
\bibcite{DBLP:books/daglib/0020103}{Crochemore et~al., 2007}
\bibcite{deerwester90indexing}{Deerwester et~al., 1990}
\bibcite{adjeroh08bwt}{Donald~Adjeroh and Mukherjee, 2008}
\bibcite{Gerdemann:2010}{Gerdemann, 2010}
\bibcite{DBLP:books/cu/Gusfield1997}{Gusfield, 1997}
\bibcite{Hogben:2006}{Hogben, 2006}
\bibcite{Karkkainen:2006}{K\"{a}rkk\"{a}inen et~al., 2006}
\bibcite{DBLP:conf/cpm/KasaiLAAP01}{Kasai et~al., 2001}
\bibcite{DBLP:journals/algorithmica/KimKP08}{Kim et~al., 2008}
\bibcite{koehn2005epc}{Koehn, 2005}
\bibcite{SMT:Koehn2010}{Koehn, 2010}
\bibcite{DBLP:journals/siamcomp/ManberM93}{Manber and Myers, 1993}
\bibcite{McCreight:1976:SST:321941.321946}{McCreight, 1976}
\bibcite{Mcnamee:2006}{Mcnamee and Mayfield, 2006}
\bibcite{Meyer:2000:MAA:343374}{Meyer, 2000}
\bibcite{citeulike:1305383}{Poole, 2005}
\bibcite{Salton:1971:SRS:1102022}{Salton, 1971}
\bibcite{DBLP:books/daglib/0001349}{Trefethen and Bau, 1997}
\bibcite{DBLP:journals/corr/abs-1003-1141}{Turney and Pantel, 2010}
\bibcite{ukkonen1995:suffix}{Ukkonen, 1995}
\bibcite{DBLP:conf/focs/Weiner73}{Weiner, 1973}
\@writefile{toc}{\contentsline {section}{\tocsection {}{}{References}}{57}}
\bibcite{widdows04geometry}{Widdows, 2004}
\bibcite{Yamamoto:2001:USA:972778.972779}{Yamamoto and Church, 2001}
\bibcite{Zhang05anefficient}{Zhang and Vogel, 2005}
\bibstyle{apalike}
\@writefile{toc}{\contentsline {section}{List of Figures}{59}}
\@writefile{toc}{\contentsline {section}{List of Tables}{60}}
\@writefile{toc}{\contentsline {section}{\tocsection {}{}{Index}}{62}}
\newlabel{tocindent-1}{0pt}
\newlabel{tocindent0}{51.04643pt}
\newlabel{tocindent1}{24.94171pt}
\newlabel{tocindent2}{38.47682pt}
\newlabel{tocindent3}{0pt}
